/*
 * Transforms one group of four consecutive floats of `inmatrix` in place,
 * using the 16 coefficients in `inrotation`.
 *
 * Work-item g (dimension 0) owns inmatrix[4*g .. 4*g+3]. Element r of the
 * group is replaced by the dot product of the group's original four values
 * with (inrotation[r], inrotation[r+4], inrotation[r+8], inrotation[r+12]).
 *
 * inmatrix   : read/write buffer, processed four floats per work-item.
 * inrotation : coefficient buffer; indices 0..15 are read.
 *
 * NOTE(review): there is no bounds guard, so the host presumably launches
 * exactly (buffer length / 4) work-items -- confirm against the caller.
 */
__kernel void matrixmultiply(__global float* inmatrix, __global float* inrotation)
{
	int base = get_global_id(0)*4;

	/* Snapshot the four inputs before any store, so results written below
	   never feed back into later dot products. */
	const float4 vec = vload4(0, inmatrix + base);

	int r = 0;
	while (r < 4)
	{
		/* Gather the four coefficients spaced 4 apart, starting at r. */
		float4 coeff;
		coeff.x = inrotation[r];
		coeff.y = inrotation[r+4];
		coeff.z = inrotation[r+8];
		coeff.w = inrotation[r+12];

		inmatrix[base+r] = dot(vec, coeff);
		r++;
	}
}